Fragestellung: “Die Manschafft, die zur Halbzeit vorne liegt, gewinnt mit einer 75% Chance auch das Spiel. Falls zur Halbzeit unentschieden ist, gewinnt eher das Heimteam.”
Dafür nehmen wir den Datacamp Datensatz Soccer Data
Als Einführung werden wir auf Datacamp folgende Kurse durchgehen:
# Bibliotheken importieren
library("plotly")
library("plyr")
library("dplyr")
# List files in Data folder
files <- list.files(path="./Data/", pattern=NULL, all.files=FALSE, full.names=TRUE)
# Create DataFrame with all csv from 2015-2019
df <- ldply(.data = files, .fun = read.csv)
# View entire DataFrame in R Studio
#View(df)
group_by_referee <- aggregate(
x = df$Referee,
by = list(df$Referee),
FUN = function(x) length(unique(x)))
htr_table <- df %>%
count(HTR)
ftr_table <- df %>%
count(FTR)
Results = c("Away", "Draw", "Home")
HT_count <- c(htr_table$n)
FT_count <- c(ftr_table$n)
df_results <- data.frame(Results, HT_count, FT_count)
fig <- plot_ly(
df_results, x = ~Results, y = ~HT_count, type = 'bar', name = 'Half Time Score') %>%
add_trace(y = ~FT_count, name = 'Full Time Score') %>%
layout(yaxis = list(title = 'Count'), barmode = 'group')
fig
NA
LS0tDQp0aXRsZTogIkRhdGF2aXogbWl0IFBsb3RseSBQTCBEYXRhIg0Kb3V0cHV0OiBodG1sX25vdGVib29rDQotLS0NCg0KIyMgRnJhZ2VzdGVsbHVuZzogIkRpZSBNYW5zY2hhZmZ0LCBkaWUgenVyIEhhbGJ6ZWl0IHZvcm5lIGxpZWd0LCBnZXdpbm50IG1pdCBlaW5lciA3NSUgQ2hhbmNlIGF1Y2ggZGFzIFNwaWVsLiBGYWxscyB6dXIgSGFsYnplaXQgdW5lbnRzY2hpZWRlbiBpc3QsIGdld2lubnQgZWhlciBkYXMgSGVpbXRlYW0uIg0KDQoNCkRhZsO8ciBuZWhtZW4gd2lyIGRlbiBEYXRhY2FtcCBEYXRlbnNhdHogW1NvY2NlciBEYXRhXShodHRwczovL2FwcC5kYXRhY2FtcC5jb20vd29ya3NwYWNlL2RhdGFzZXRzL2RhdGFzZXQtcHl0aG9uLXNvY2NlcikNCg0KQWxzIEVpbmbDvGhydW5nIHdlcmRlbiB3aXIgYXVmIERhdGFjYW1wIGZvbGdlbmRlIEt1cnNlIGR1cmNoZ2VoZW46DQoNCi0gW0ludGVyYWN0aXZlIERhdGEgVmlzdWFsaXphdGlvbiB3aXRoIHBsb3RseV0oaHR0cHM6Ly9hcHAuZGF0YWNhbXAuY29tL2xlYXJuL2NvdXJzZXMvaW50ZXJhY3RpdmUtZGF0YS12aXN1YWxpemF0aW9uLXdpdGgtcGxvdGx5LWluLXIpDQoNCi0gW0ludGVybWVkaWF0ZSBJbnRlcmFjdGl2ZSBEYXRhIFZpc3VhbGl6YXRpb24gd2l0aCBwbG90bHldKGh0dHBzOi8vYXBwLmRhdGFjYW1wLmNvbS9sZWFybi9jb3Vyc2VzL2ludGVyYWN0aXZlLWRhdGEtdmlzdWFsaXphdGlvbi13aXRoLXBsb3RseS1pbi1yKQ0KDQpgYGB7cn0NCiMgQmlibGlvdGhla2VuIGltcG9ydGllcmVuDQpsaWJyYXJ5KCJwbG90bHkiKQ0KbGlicmFyeSgicGx5ciIpDQpsaWJyYXJ5KCJkcGx5ciIpDQpgYGANCg0KYGBge3J9DQojIExpc3QgZmlsZXMgaW4gRGF0YSBmb2xkZXINCmZpbGVzIDwtIGxpc3QuZmlsZXMocGF0aD0iLi9EYXRhLyIsIHBhdHRlcm49TlVMTCwgYWxsLmZpbGVzPUZBTFNFLCBmdWxsLm5hbWVzPVRSVUUpDQoNCiMgQ3JlYXRlIERhdGFGcmFtZSB3aXRoIGFsbCBjc3YgZnJvbSAyMDE1LTIwMTkNCmRmIDwtIGxkcGx5KC5kYXRhID0gZmlsZXMsIC5mdW4gPSByZWFkLmNzdikNCg0KIyBWaWV3IGVudGlyZSBEYXRhRnJhbWUgaW4gUiBTdHVkaW8NCiNWaWV3KGRmKQ0KDQpgYGANCg0KYGBge3J9DQpncm91cF9ieV9yZWZlcmVlIDwtIGFnZ3JlZ2F0ZSgNCiAgICAgICAgICAgICAgICAgICAgeCA9IGRmJFJlZmVyZWUsDQogICAgICAgICAgICAgICAgICAgIGJ5ID0gbGlzdChkZiRSZWZlcmVlKSwNCiAgICAgICAgICAgICAgICAgICAgRlVOID0gZnVuY3Rpb24oeCkgbGVuZ3RoKHVuaXF1ZSh4KSkpDQpgYGANCg0KYGBge3J9DQpodHJfdGFibGUgPC0gZGYgJT4lDQoJY291bnQoSFRSKQ0KDQpmdHJfdGFibGUgPC0gZGYgJT4lDQoJY291bnQoRlRSKQ0KDQpSZXN1bHRzID0gYygiQXdheSIsICJEcmF3IiwgIkhvbWUiKQ0KSFRfY291bnQgPC0gYyhodHJfdGFibGUkbikNCkZUX2NvdW50IDwtIGMoZnRyX3RhYmxlJG4pDQoNCmRmX3Jlc3VsdHMgPC0gZGF0YS5mcmFtZShSZXN1bHRzLCBIVF9jb3VudCwgRlRfY291bnQpDQoNCmZpZyA8LSBwbG90X2x5KA0KICBkZl9yZXN1bHRzLCB4ID0gflJlc3VsdHMsIHkgPSB+SFRfY291bnQsIHR5cGUgPSAnYmFyJywgbmFtZSA9ICdIYWxmIFRpbWUgU2NvcmUnKSAlPiUgDQogIGFkZF90cmFjZSh5ID0gfkZUX2NvdW50LCBuYW1lID0gJ0Z1bGwgVGltZSBTY29yZScpICU+JQ0KICBsYXlvdXQoeWF4aXMgPSBsaXN0KHRpdGxlID0gJ0NvdW50JyksIGJhcm1vZGUgPSAnZ3JvdXAnKQ0KDQpmaWcNCg0KYGBgDQo=